% Textbook on model predictive control (second edition).
% The year is set to 2017 so that it agrees with the citation key.
% NOTE(review): confirm against the printing that is actually cited.
@book{rawlings_model_2017,
  author    = {Rawlings, James Blake and Mayne, David Q. and Diehl, Moritz},
  title     = {Model Predictive Control: Theory, Computation, and Design},
  edition   = {2},
  publisher = {Nob Hill Publishing},
  address   = {Madison, USA},
  year      = {2017},
}

% Textbook on reinforcement learning.
% The title is stored in Title Case so that styles can down-case it if they wish;
% the publisher name is spelled as a proper noun.
% NOTE(review): edition and address were added from memory -- confirm.
@book{sutton_reinforcement_2018,
  author    = {Sutton, Richard S. and Barto, Andrew G.},
  title     = {Reinforcement Learning: An Introduction},
  edition   = {2},
  publisher = {MIT Press},
  address   = {Cambridge, MA, USA},
  year      = {2018},
}

% Textbook on numerical optimization.
% NOTE(review): edition and address were added from memory -- confirm.
@book{nocedal_numerical_2006,
  author    = {Nocedal, Jorge and Wright, Stephen J.},
  title     = {Numerical Optimization},
  edition   = {2},
  publisher = {Springer},
  address   = {New York, NY, USA},
  year      = {2006},
}

% Conference paper (ECC 2021).
% Empty volume/number fields were removed (they only produce "empty field"
% warnings) and the page range uses the en-dash form.
@inproceedings{esfahani_approximate_2021,
  author    = {Esfahani, Hossein Nejatbakhsh and Kordabad, Arash Bahari and Gros, S{\'e}bastien},
  title     = {Approximate Robust {NMPC} Using Reinforcement Learning},
  booktitle = {2021 European Control Conference (ECC)},
  pages     = {132--137},
  year      = {2021},
}

% Conference paper (CDC 2021).
% Empty volume/number fields were removed and the page range uses the en-dash form.
% Given names of Kordabad and Esfahani are spelled out exactly as in the
% esfahani_approximate_2021 entry so that both entries name the same people identically.
@inproceedings{cai_mpcbased_2021,
  author    = {Cai, Wenqi and Kordabad, Arash Bahari and Esfahani, Hossein Nejatbakhsh and Lekkas, Anastasios M. and Gros, S{\'e}bastien},
  title     = {{MPC}-Based Reinforcement Learning for a Simplified Freight Mission of Autonomous Surface Vehicles},
  booktitle = {2021 60th IEEE Conference on Decision and Control (CDC)},
  pages     = {2990--2995},
  year      = {2021},
}

% Journal article (IEEE Transactions on Automatic Control).
% The page range uses the en-dash form.
@article{gros_datadriven_2020,
  author  = {Gros, S{\'e}bastien and Zanon, Mario},
  title   = {Data-Driven Economic {NMPC} Using Reinforcement Learning},
  journal = {IEEE Transactions on Automatic Control},
  volume  = {65},
  number  = {2},
  pages   = {636--648},
  year    = {2020},
}

% Book on Bayesian optimization.
@book{garnett_bayesoptbook_2023,
  author    = {Garnett, Roman},
  title     = {Bayesian Optimization},
  publisher = {Cambridge University Press},
  year      = {2023},
}

% Journal article (IEEE Transactions on Automatic Control).
% The page range uses the en-dash form.
@article{zanon_safe_2021,
  author  = {Zanon, Mario and Gros, S{\'e}bastien},
  title   = {Safe Reinforcement Learning Using Robust {MPC}},
  journal = {IEEE Transactions on Automatic Control},
  volume  = {66},
  number  = {8},
  pages   = {3638--3652},
  year    = {2021},
}

% Journal article (Automatica); the pages field holds the single value 110598.
% Author names are in the "Last, First" form used by the other entries of this file,
% and the title is stored in Title Case.
@article{gros_learning_2022,
  author  = {Gros, S{\'e}bastien and Zanon, Mario},
  title   = {Learning for {MPC} with Stability \& Safety Guarantees},
  journal = {Automatica},
  volume  = {146},
  pages   = {110598},
  year    = {2022},
}

% arXiv preprint.
% It was previously encoded as an article in "CoRR" with volume "abs/1906.04034";
% the identifier now lives only in the eprint fields and the URL.
% Author names are in the "Last, First" form used by the other entries of this file.
@misc{gros_towards_2019,
  author     = {Gros, S{\'e}bastien and Zanon, Mario},
  title      = {Towards Safe Reinforcement Learning Using {NMPC} and Policy Gradients: Part {II} -- Deterministic Case},
  year       = {2019},
  eprint     = {1906.04034},
  eprinttype = {arXiv},
  url        = {https://arxiv.org/abs/1906.04034},
}

% Conference paper (ACC 2021).
% Empty volume/number fields were removed, the page range uses the en-dash form,
% and the acronym MPC is brace-protected against style-driven down-casing.
@inproceedings{gros_reinforcement_2021,
  author    = {Gros, S{\'e}bastien and Zanon, Mario},
  title     = {Reinforcement Learning Based on {MPC} and the Stochastic Policy Gradient Method},
  booktitle = {2021 American Control Conference (ACC)},
  pages     = {1947--1952},
  year      = {2021},
}

% Conference paper (ICML 2013, published in the PMLR series).
% The month field uses the standard unquoted macro; the day range that used to be
% embedded in it (17--19 June) is kept in the ISO-formatted eventdate field.
% NOTE(review): address holds the conference location as exported -- confirm that
% the bibliography style in use renders it as intended.
@inproceedings{sutskever_importance_2013,
  author    = {Sutskever, Ilya and Martens, James and Dahl, George and Hinton, Geoffrey},
  title     = {On the Importance of Initialization and Momentum in Deep Learning},
  booktitle = {Proceedings of the 30th International Conference on Machine Learning},
  editor    = {Dasgupta, Sanjoy and McAllester, David},
  series    = {Proceedings of Machine Learning Research},
  volume    = {28},
  number    = {3},
  pages     = {1139--1147},
  publisher = {PMLR},
  address   = {Atlanta, Georgia, USA},
  eventdate = {2013-06-17/2013-06-19},
  month     = jun,
  year      = {2013},
}

% arXiv preprint.
% The identifier was previously stuffed into the journal field; it now lives in
% the eprint fields and the URL.
% NOTE(review): a peer-reviewed version of this work may exist -- consider citing it instead.
@misc{reddi_convergence_2019,
  author     = {Reddi, Sashank J. and Kale, Satyen and Kumar, Sanjiv},
  title      = {On the Convergence of {Adam} and Beyond},
  year       = {2019},
  eprint     = {1904.09237},
  eprinttype = {arXiv},
  url        = {https://arxiv.org/abs/1904.09237},
}

% arXiv preprint.
% The identifier was previously stuffed into the journal field; it now lives in
% the eprint fields and the URL.
% NOTE(review): a peer-reviewed version of this work may exist -- consider citing it instead.
@misc{loshchilov_decoupled_2017,
  author     = {Loshchilov, Ilya and Hutter, Frank},
  title      = {Decoupled Weight Decay Regularization},
  year       = {2017},
  eprint     = {1711.05101},
  eprinttype = {arXiv},
  url        = {https://arxiv.org/abs/1711.05101},
}

% arXiv preprint.
% The identifier was previously stuffed into the journal field; it now lives in
% the eprint fields and the URL.
% NOTE(review): a peer-reviewed version of this work may exist -- consider citing it instead.
@misc{kingma_adam_2014,
  author     = {Kingma, Diederik P. and Ba, Jimmy},
  title      = {{Adam}: A Method for Stochastic Optimization},
  year       = {2014},
  eprint     = {1412.6980},
  eprinttype = {arXiv},
  url        = {https://arxiv.org/abs/1412.6980},
}

% Lecture material, not a journal article: the former journal field held the
% lecture name, so the entry is typed as misc and the lecture name moved to howpublished.
% The original export also carried volume 6a and pages 31; these were dropped as
% artefacts of the article encoding. NOTE(review): restore the page/slide
% reference in a note field if a specific slide is being cited.
@misc{hinton_neural_2012,
  author       = {Hinton, Geoffrey and Srivastava, Nitish and Swersky, Kevin},
  title        = {Neural Networks for Machine Learning},
  howpublished = {Lecture 6a: Overview of Mini-Batch Gradient Descent},
  year         = {2012},
}

% Chapter in an edited Springer volume.
@incollection{buskens_sensitivity_2001,
  author    = {B{\"u}skens, Christof and Maurer, Helmut},
  title     = {Sensitivity Analysis and Real-Time Optimization of Parametric Nonlinear Programming Problems},
  booktitle = {Online Optimization of Large Scale Systems},
  editor    = {Gr{\"o}tschel, Martin and Krumke, Sven O. and Rambau, J{\"o}rg},
  pages     = {3--16},
  publisher = {Springer},
  address   = {Berlin, Heidelberg},
  year      = {2001},
}
